% Carey and Bartlett (1978). The journal, volume and pages are given so the
% article entry carries its required venue; the title has no hard-coded period.
@article{carey1978acquiring,
  author    = {Carey, Susan and Bartlett, Elsa},
  title     = {Acquiring a single new word},
  journal   = {Papers and Reports on Child Language Development},
  volume    = {15},
  pages     = {17--29},
  year      = {1978},
  publisher = {ERIC}
}
% Li, Fergus and Perona: one-shot learning of object categories, PAMI 28(4), 2006.
@article{fei2006one,
  author    = {Li, Fei-Fei and Fergus, Rob and Perona, Pietro},
  title     = {One-shot learning of object categories},
  journal   = {PAMI},
  volume    = {28},
  number    = {4},
  pages     = {594--611},
  year      = {2006},
  publisher = {IEEE}
}
% Lake, Salakhutdinov and Tenenbaum, NIPS 2013.
@inproceedings{lake2013one,
  author    = {Lake, Brenden M and Salakhutdinov, Ruslan R and Tenenbaum, Josh},
  title     = {One-shot learning by inverting a compositional causal process},
  booktitle = {NIPS},
  pages     = {2526--2534},
  year      = {2013}
}
% Thrun's chapter in the edited volume "Learning to learn" (Springer, 1998).
@incollection{thrun1998lifelong,
  author    = {Thrun, Sebastian},
  title     = {Lifelong learning algorithms},
  booktitle = {Learning to learn},
  pages     = {181--209},
  year      = {1998},
  publisher = {Springer}
}
% Schmidhuber, Zhao and Wiering, Machine Learning 28(1), 1997.
% "Levin" is a proper noun, braced so sentence-casing styles keep its capital.
@article{schmidhuber1997shifting,
  author    = {Schmidhuber, J{\"u}rgen and Zhao, Jieyu and Wiering, Marco},
  title     = {Shifting inductive bias with success-story algorithm, adaptive {Levin} search, and incremental self-improvement},
  journal   = {Machine Learning},
  volume    = {28},
  number    = {1},
  pages     = {105--130},
  year      = {1997},
  publisher = {Springer}
}
% Hochreiter and Schmidhuber, Neural computation 9(8), 1997.
@article{hochreiter1997long,
  author    = {Hochreiter, Sepp and Schmidhuber, J{\"u}rgen},
  title     = {Long short-term memory},
  journal   = {Neural computation},
  volume    = {9},
  number    = {8},
  pages     = {1735--1780},
  year      = {1997},
  publisher = {MIT Press}
}
% Wang, Girshick, Hebert and Hariharan, CVPR 2018 (the key keeps its 2017 suffix
% so existing citations still resolve). The title is not wrapped in a second
% brace pair, so the bibliography style controls its casing like other entries.
@inproceedings{yuxiongwang2017imaginary,
  author    = {Yu-Xiong Wang and Ross Girshick and Martial Hebert and Bharath Hariharan},
  title     = {Low-Shot Learning from Imaginary Data},
  booktitle = {CVPR},
  year      = {2018}
}
% Ren et al., published at ICLR 2018; cited as a conference paper rather than
% with the arXiv identifier stored in a journal field.
@inproceedings{ren2018meta,
  author    = {Ren, Mengye and Triantafillou, Eleni and Ravi, Sachin and Snell, Jake and Swersky, Kevin and Tenenbaum, Joshua B and Larochelle, Hugo and Zemel, Richard S},
  title     = {Meta-Learning for Semi-Supervised Few-Shot Classification},
  booktitle = {ICLR},
  year      = {2018}
}

% Koch, Zemel and Salakhutdinov, ICML Deep Learning Workshop 2015.
@inproceedings{koch2015siamese,
  author    = {Koch, Gregory and Zemel, Richard and Salakhutdinov, Ruslan},
  title     = {Siamese neural networks for one-shot image recognition},
  booktitle = {ICML Deep Learning Workshop},
  volume    = {2},
  year      = {2015}
}
% Hadsell, Chopra and LeCun, CVPR 2006.
@inproceedings{hadsell2006dimensionality,
  author       = {Hadsell, Raia and Chopra, Sumit and LeCun, Yann},
  title        = {Dimensionality reduction by learning an invariant mapping},
  booktitle    = {CVPR},
  volume       = {2},
  pages        = {1735--1742},
  year         = {2006},
  organization = {IEEE}
}
% Fink, NIPS 2005.
@inproceedings{fink2005object,
  author    = {Fink, Michael},
  title     = {Object classification from a single example utilizing class relevance metrics},
  booktitle = {NIPS},
  pages     = {449--456},
  year      = {2005}
}
% Schroff, Kalenichenko and Philbin, CVPR 2015.
% The system name "FaceNet" is braced so styles keep its internal capital.
@inproceedings{schroff2015facenet,
  author    = {Schroff, Florian and Kalenichenko, Dmitry and Philbin, James},
  title     = {{FaceNet}: A unified embedding for face recognition and clustering},
  booktitle = {CVPR},
  pages     = {815--823},
  year      = {2015}
}
% Taigman, Yang, Ranzato and Wolf, CVPR 2015.
@inproceedings{taigman2015web,
  author    = {Taigman, Yaniv and Yang, Ming and Ranzato, Marc'Aurelio and Wolf, Lior},
  title     = {Web-scale training for face identification},
  booktitle = {CVPR},
  pages     = {2746--2754},
  year      = {2015}
}
% Shyam, Gupta and Dukkipati, ICML 2017.
@inproceedings{shyam2017attentive,
  author    = {Shyam, Pranav and Gupta, Shubham and Dukkipati, Ambedkar},
  title     = {Attentive Recurrent Comparators},
  booktitle = {ICML},
  pages     = {3173--3181},
  year      = {2017}
}

% He, Zhang, Ren and Sun, CVPR 2016. CVPR is a conference, so the venue is
% stored in booktitle of an inproceedings entry, like the file's other CVPR papers.
@inproceedings{He2016Deep,
  author    = {Kaiming He and Xiangyu Zhang and Shaoqing Ren and Jian Sun},
  title     = {Deep Residual Learning for Image Recognition},
  booktitle = {CVPR},
  pages     = {770--778},
  year      = {2016}
}

% Ramachandran, Zoph and Le, ICLR 2018 (the key keeps its 2017 suffix so
% existing citations still resolve). No page numbers are recorded.
@inproceedings{Ramachandran2017searching,
  author    = {Prajit Ramachandran and Barret Zoph and Quoc V. Le},
  title     = {Searching for Activation Functions},
  booktitle = {ICLR},
  year      = {2018}
}


% Szegedy et al., CVPR 2015.
@inproceedings{Szegedy2015going,
  author    = {Christian Szegedy and Wei Liu and Yangqing Jia and Pierre Sermanet and Scott Reed and Dragomir Anguelov and Dumitru Erhan and Vincent Vanhoucke and Andrew Rabinovich},
  title     = {Going Deeper with Convolutions},
  booktitle = {CVPR},
  year      = {2015}
}

% Bilen and Vedaldi, arXiv preprint, January 2017. The month uses the
% predefined macro and no empty fields are kept.
@article{bileh2017universal,
  author  = {Bilen, Hakan and Vedaldi, Andrea},
  title   = {Universal representations: The missing link between faces, text, planktons, and cat breeds},
  journal = {arXiv preprint arXiv:1701.07275},
  month   = jan,
  year    = {2017}
}


% Santoro et al., ICML 2016 (PMLR volume 48).
% The month is the standard macro; the conference ran 20--22 June.
@inproceedings{Santoro16metalearning,
  author    = {Adam Santoro and Sergey Bartunov and Matthew Botvinick and Daan Wierstra and Timothy Lillicrap},
  title     = {Meta-Learning with Memory-Augmented Neural Networks},
  booktitle = {ICML},
  editor    = {Maria Florina Balcan and Kilian Q. Weinberger},
  series    = {Proceedings of Machine Learning Research},
  volume    = {48},
  pages     = {1842--1850},
  address   = {New York, New York, USA},
  publisher = {PMLR},
  month     = jun,
  year      = {2016}
}


% Mishra, Rohaninejad, Chen and Abbeel, ICLR 2018.
@inproceedings{mishra2018simle,
  author    = {Nikhil Mishra and Mostafa Rohaninejad and Xi Chen and Pieter Abbeel},
  title     = {A Simple Neural Attentive Meta-Learner},
  booktitle = {ICLR},
  year      = {2018}
}


% Lacoste et al., arXiv preprint 1712.05016 (2017).
@article{Lacoste2018deepprior,
  author  = {Alexandre Lacoste and Thomas Boquet and Negar Rostamzadeh and Boris Oreshkin and Wonchang Chung and David Krueger},
  title   = {Deep Prior},
  journal = {arXiv preprint arXiv:1712.05016},
  year    = {2017}
}


% Krizhevsky's 2009 University of Toronto technical report.
% The report label is spelled out rather than blanked with a tie character,
% which would leave a stray comma in the formatted reference.
@techreport{Krizhevsky2009learning,
  author      = {Krizhevsky, Alex},
  title       = {Learning Multiple Layers of Features from Tiny Images},
  type        = {Technical Report},
  institution = {University of Toronto},
  year        = {2009}
}


% Sung et al., CVPR 2018. Only populated fields are kept; empty fields
% trigger BibTeX warnings and carry no information.
@inproceedings{sung2018learning,
  author    = {Sung, Flood and Yang, Yongxin and Zhang, Li and Xiang, Tao and Torr, Philip HS and Hospedales, Timothy M},
  title     = {Learning to Compare: Relation Network for Few-Shot Learning},
  booktitle = {CVPR},
  year      = {2018}
}


% Bauer et al., arXiv preprint 1706.00326 (2017).
% Accented letters use LaTeX escapes, matching the rest of this file, so classic
% 8-bit BibTeX sorts and labels the names correctly. The ogonek escape needs a
% T1-capable font encoding at the LaTeX level, as the raw character would.
@article{Bauer2017discriminative,
  author  = {Bauer, Matthias and Rojas-Carulla, Mateo and {\'S}wi{\k{a}}tkowski, Jakub Bart{\l}omiej and Sch{\"o}lkopf, Bernhard and Turner, Richard E.},
  title   = {Discriminative k-shot learning using probabilistic models},
  journal = {arXiv preprint arXiv:1706.00326},
  year    = {2017}
}


% Xing, Ng, Jordan and Russell, NIPS 2002. The venue abbreviation is spelled
% "NIPS", as in every other NIPS entry of this file.
@inproceedings{Xing2002metric,
  author    = {Xing, Eric P. and Ng, Andrew Y. and Jordan, Michael I. and Russell, Stuart},
  title     = {Distance Metric Learning, with Application to Clustering with Side-information},
  booktitle = {NIPS},
  series    = {NIPS'02},
  pages     = {521--528},
  numpages  = {8},
  acmid     = {2968683},
  publisher = {MIT Press},
  address   = {Cambridge, MA, USA},
  year      = {2002}
}


% Dumoulin, Shlens and Kudlur, ICLR 2017. ICLR is a conference, so the venue is
% stored in booktitle of an inproceedings entry, like the file's other ICLR papers.
@inproceedings{Dumoulin2017learned,
  author    = {Vincent Dumoulin and Jonathon Shlens and Manjunath Kudlur},
  title     = {A Learned Representation For Artistic Style},
  booktitle = {ICLR},
  year      = {2017}
}


% Perez et al., CoRR abs/1707.03017 (2017).
@article{Perez2017LearningVR,
  author  = {Ethan Perez and Harm de Vries and Florian Strub and Vincent Dumoulin and Aaron C. Courville},
  title   = {Learning Visual Reasoning Without Strong Priors},
  journal = {CoRR},
  volume  = {abs/1707.03017},
  year    = {2017}
}
% Munkhdalai, Yuan, Mehri and Trischler, ICML 2018.
@inproceedings{munkhdalai2018rapid,
  author    = {Tsendsuren Munkhdalai and Xingdi Yuan and Soroush Mehri and Adam Trischler},
  title     = {Rapid Adaptation with Conditionally Shifted Neurons},
  booktitle = {ICML},
  year      = {2018}
}
% Vaswani et al., NIPS 2017.
@inproceedings{vaswani2017attention,
  author    = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N and Kaiser, {\L}ukasz and Polosukhin, Illia},
  title     = {Attention is all you need},
  booktitle = {NIPS},
  pages     = {6000--6010},
  year      = {2017}
}

% Rippel, Paluri, Dollar and Bourdev, arXiv preprint 1511.05939 (2015).
% The accent in the third author's surname is written as a LaTeX escape.
@article{rippel2015metric,
  author  = {Rippel, Oren and Paluri, Manohar and Doll{\'a}r, Piotr and Bourdev, Lubomir},
  title   = {Metric learning with adaptive density discrimination},
  journal = {arXiv preprint arXiv:1511.05939},
  year    = {2015}
}
% Perez et al., AAAI 2018 (the key keeps its 2017 suffix so existing citations
% still resolve). "FiLM" is braced to preserve its mixed casing, and the
% lowercase "de" particle matches how the same author appears elsewhere in
% this file.
@inproceedings{perez2017film,
  author    = {Perez, Ethan and Strub, Florian and de Vries, Harm and Dumoulin, Vincent and Courville, Aaron},
  title     = {{FiLM}: Visual reasoning with a general conditioning layer},
  booktitle = {AAAI},
  year      = {2018}
}

% de Vries et al., NIPS 2017.
@inproceedings{devries2017modulating,
  title     = {Modulating early visual processing by language},
  author    = {de Vries, Harm and Strub, Florian and Mary, Jeremie and Larochelle, Hugo and Pietquin, Olivier and Courville, Aaron},
  booktitle = {NIPS},
  pages     = {6597--6607},
  year      = {2017}
}

% Finn, Abbeel and Levine, ICML 2017.
@inproceedings{finn2017model,
  author    = {Chelsea Finn and Pieter Abbeel and Sergey Levine},
  title     = {Model-Agnostic Meta-Learning for Fast Adaptation of Deep Networks},
  booktitle = {ICML},
  pages     = {1126--1135},
  year      = {2017}
}

% Snell, Swersky and Zemel, NIPS 2017.
@inproceedings{snell2017prototypical,
  title     = {Prototypical Networks for Few-shot Learning},
  author    = {Jake Snell and Kevin Swersky and Richard S. Zemel},
  booktitle = {NIPS},
  year      = {2017},
  pages     = {4080--4090}
}

% Vinyals et al., NIPS 2016. Typed as a conference paper like the other NIPS
% entries in this file (an incollection entry would require a publisher), with
% all author names in the unambiguous "Last, First" form.
@inproceedings{vinyals2016matching,
  author    = {Vinyals, Oriol and Blundell, Charles and Lillicrap, Tim and Kavukcuoglu, Koray and Wierstra, Daan},
  title     = {Matching Networks for One Shot Learning},
  booktitle = {NIPS},
  pages     = {3630--3638},
  year      = {2016}
}

% Welling and Teh, ICML 2011. "Bayesian" and "Langevin" derive from proper
% names and are braced so sentence-casing styles keep their capitals.
@inproceedings{welling2011bayesian,
  author    = {Welling, Max and Teh, Yee W},
  title     = {{Bayesian} learning via stochastic gradient {Langevin} dynamics},
  booktitle = {ICML},
  pages     = {681--688},
  year      = {2011}
}

% Kingma, Salimans and Welling, NIPS 2016.
@inproceedings{kingma2016improving,
  author    = {Kingma, Diederik P and Salimans, Tim and Welling, Max},
  title     = {Improving variational inference with inverse autoregressive flow},
  booktitle = {NIPS},
  year      = {2016}
}

% Kingma and Welling, arXiv preprint 1312.6114 (2013).
% "Bayes" is a proper name, capitalised and braced so styles do not lowercase it.
@article{kingma2013auto,
  author  = {Kingma, Diederik P and Welling, Max},
  title   = {Auto-encoding variational {Bayes}},
  journal = {arXiv preprint arXiv:1312.6114},
  year    = {2013}
}

% Ba, Kiros and Hinton, arXiv preprint 1607.06450 (2016).
@article{ba2016layer,
  author  = {Ba, Jimmy Lei and Kiros, Jamie Ryan and Hinton, Geoffrey E},
  title   = {Layer normalization},
  journal = {arXiv preprint arXiv:1607.06450},
  year    = {2016}
}

% Blundell, Cornebise, Kavukcuoglu and Wierstra, ICML 2015.
@inproceedings{blundell2015weight,
  author    = {Blundell, Charles and Cornebise, Julien and Kavukcuoglu, Koray and Wierstra, Daan},
  title     = {Weight Uncertainty in Neural Network},
  booktitle = {ICML},
  pages     = {1613--1622},
  year      = {2015}
}

% Kingma, Salimans and Welling, NIPS 2015.
@inproceedings{kingma2015variational,
  author    = {Kingma, Diederik P and Salimans, Tim and Welling, Max},
  title     = {Variational dropout and the local reparameterization trick},
  booktitle = {NIPS},
  pages     = {2575--2583},
  year      = {2015}
}

% Gal and Ghahramani, ICML 2016.
% "Bayesian" is braced so sentence-casing styles keep its capital.
@inproceedings{gal2016dropout,
  author    = {Gal, Yarin and Ghahramani, Zoubin},
  title     = {Dropout as a {Bayesian} approximation: Representing model uncertainty in deep learning},
  booktitle = {ICML},
  pages     = {1050--1059},
  year      = {2016}
}

% Krueger et al., arXiv preprint 1710.04759 (2017).
@article{krueger2017bayesian,
  author  = {Krueger, David and Huang, Chin-Wei and Islam, Riashat and Turner, Ryan and Lacoste, Alexandre and Courville, Aaron},
  title   = {Bayesian Hypernetworks},
  journal = {arXiv preprint arXiv:1710.04759},
  year    = {2017}
}

% Gal, Islam and Ghahramani, ICML 2017.
% "Bayesian" is braced so sentence-casing styles keep its capital.
@inproceedings{gal2017deep,
  author    = {Gal, Yarin and Islam, Riashat and Ghahramani, Zoubin},
  title     = {Deep {Bayesian} Active Learning with Image Data},
  booktitle = {ICML},
  pages     = {1183--1192},
  year      = {2017}
}

% Goodfellow et al., NIPS 2014.
@inproceedings{goodfellow2014generative,
  author    = {Goodfellow, Ian and Pouget-Abadie, Jean and Mirza, Mehdi and Xu, Bing and Warde-Farley, David and Ozair, Sherjil and Courville, Aaron and Bengio, Yoshua},
  title     = {Generative adversarial nets},
  booktitle = {NIPS},
  pages     = {2672--2680},
  year      = {2014}
}

% Edwards and Storkey, arXiv preprint 1606.02185 (2016).
@article{edwards2016towards,
  author  = {Edwards, Harrison and Storkey, Amos},
  title   = {Towards a neural statistician},
  journal = {arXiv preprint arXiv:1606.02185},
  year    = {2016}
}

% Ravi and Larochelle. The paper appeared in the ICLR 2017 proceedings; the key
% keeps its 2016 suffix so existing citations still resolve.
@inproceedings{ravi2016optimization,
  author    = {Ravi, Sachin and Larochelle, Hugo},
  title     = {Optimization as a model for few-shot learning},
  booktitle = {ICLR},
  year      = {2017}
}

% Arjovsky and Bottou, ICLR 2017.
@inproceedings{arjovsky2017towards,
  author    = {Arjovsky, Martin and Bottou, L{\'e}on},
  title     = {Towards principled methods for training generative adversarial networks},
  booktitle = {ICLR},
  year      = {2017}
}

% Grunwald and Langford, Machine Learning 66(2--3), 2007.
% The issue range uses an en dash, and "Bayes" and "MDL" are braced so
% sentence-casing styles keep their capitals.
@article{grunwald2007suboptimal,
  author    = {Gr{\"u}nwald, Peter and Langford, John},
  title     = {Suboptimal behavior of {Bayes} and {MDL} in classification under misspecification},
  journal   = {Machine Learning},
  volume    = {66},
  number    = {2--3},
  pages     = {119--149},
  year      = {2007},
  publisher = {Springer}
}

% Snoek, Larochelle and Adams, NIPS 2012.
% "Bayesian" is capitalised and braced so styles do not lowercase it.
@inproceedings{snoek2012practical,
  author    = {Snoek, Jasper and Larochelle, Hugo and Adams, Ryan P},
  title     = {Practical {Bayesian} optimization of machine learning algorithms},
  booktitle = {NIPS},
  pages     = {2951--2959},
  year      = {2012}
}


% Kirkpatrick et al., PNAS 114(13), 2017.
@article{kirkpatrick2017overcoming,
  author    = {Kirkpatrick, James and Pascanu, Razvan and Rabinowitz, Neil and Veness, Joel and Desjardins, Guillaume and Rusu, Andrei A and Milan, Kieran and Quan, John and Ramalho, Tiago and Grabska-Barwinska, Agnieszka and others},
  title     = {Overcoming catastrophic forgetting in neural networks},
  journal   = {PNAS},
  volume    = {114},
  number    = {13},
  pages     = {3521--3526},
  year      = {2017},
  publisher = {National Acad Sciences}
}

% Berkenkamp, Turchetta, Schoellig and Krause, NIPS 2017.
@inproceedings{berkenkamp2017safe,
  author    = {Berkenkamp, Felix and Turchetta, Matteo and Schoellig, Angela and Krause, Andreas},
  title     = {Safe model-based reinforcement learning with stability guarantees},
  booktitle = {NIPS},
  pages     = {908--919},
  year      = {2017}
}

% Houthooft et al., NIPS 2016.
% "VIME" is an acronym, braced so styles keep it fully capitalised.
@inproceedings{houthooft2016vime,
  author    = {Houthooft, Rein and Chen, Xi and Duan, Yan and Schulman, John and De Turck, Filip and Abbeel, Pieter},
  title     = {{VIME}: Variational information maximizing exploration},
  booktitle = {NIPS},
  pages     = {1109--1117},
  year      = {2016}
}

% Rasmussen's chapter in "Advanced lectures on machine learning" (Springer, 2004).
@incollection{rasmussen2004gaussian,
  author    = {Rasmussen, Carl Edward},
  title     = {Gaussian processes in machine learning},
  booktitle = {Advanced lectures on machine learning},
  pages     = {63--71},
  year      = {2004},
  publisher = {Springer}
}

% Damianou and Lawrence, AISTATS 2013.
% "Gaussian" is capitalised and braced so styles do not lowercase it.
@inproceedings{damianou2013deep,
  author    = {Damianou, Andreas and Lawrence, Neil},
  title     = {Deep {Gaussian} processes},
  booktitle = {AISTATS},
  pages     = {207--215},
  year      = {2013}
}

% Germain, Gregor, Murray and Larochelle, ICML 2015.
% "MADE" is an acronym, braced so styles keep it fully capitalised.
@inproceedings{germain2015made,
  author    = {Germain, Mathieu and Gregor, Karol and Murray, Iain and Larochelle, Hugo},
  title     = {{MADE}: Masked autoencoder for distribution estimation},
  booktitle = {ICML},
  pages     = {881--889},
  year      = {2015}
}

% Louizos and Welling, ICML 2017.
% "Bayesian" is braced so sentence-casing styles keep its capital.
@inproceedings{louizos2017multiplicative,
  author    = {Louizos, Christos and Welling, Max},
  title     = {Multiplicative Normalizing Flows for Variational {Bayesian} Neural Networks},
  booktitle = {ICML},
  pages     = {2218--2227},
  year      = {2017}
}

% Yarin Gal's PhD thesis, University of Cambridge, 2016. A thesis entry stores
% the granting university in school rather than in a journal field.
@phdthesis{gal2016uncertainty,
  author = {Gal, Yarin},
  title  = {Uncertainty in deep learning},
  school = {University of Cambridge},
  year   = {2016}
}

% Ganin et al., JMLR volume 17, paper 59, pages 1--35 (2016).
% JMLR numbers pages per paper, so the range starts at 1.
@article{ganin2016domain,
  author    = {Ganin, Yaroslav and Ustinova, Evgeniya and Ajakan, Hana and Germain, Pascal and Larochelle, Hugo and Laviolette, Fran{\c{c}}ois and Marchand, Mario and Lempitsky, Victor},
  title     = {Domain-adversarial training of neural networks},
  journal   = {JMLR},
  volume    = {17},
  number    = {59},
  pages     = {1--35},
  year      = {2016},
  publisher = {JMLR.org}
}

